a8cedeb07d3f12d5f2e7207090a573e7df78e8b6,rl4j-core/src/main/java/org/deeplearning4j/rl4j/network/ac/ActorCriticFactoryStdConv.java,ActorCriticFactoryStdConv,buildActorCritic,#number#number#,29
Before Change
.optimizationAlgo(OptimizationAlgorithm.STOCHASTIC_GRADIENT_DESCENT)
.learningRate(conf.getLearningRate())
//.updater(Updater.NESTEROVS).momentum(0.9)
.updater(Updater.RMSPROP).rmsDecay(conf.getRmsDecay())
.weightInit(WeightInit.XAVIER)
.regularization(true)
.l2(conf.getL2())
.graphBuilder()
After Change
.learningRate(conf.getLearningRate())
//.updater(Updater.NESTEROVS).momentum(0.9)
//.updater(Updater.RMSPROP).rmsDecay(conf.getRmsDecay())
.updater(Updater.ADAM)
.weightInit(WeightInit.XAVIER)
.regularization(true)
.l2(conf.getL2())
.graphBuilder()